//gender_name_build 
//generate gender distribution by first name

****INSTRUCTIONS*****
//For the latest data, download all files from: https://www.ssa.gov/oact/babynames/limits.html
//Our analysis uses the May 5, 2019 version of the data.
//This analysis is written in SQL; we ran it in BigQuery.

****DO****
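//1.Load all the files into a single table called name_gender (the query below reads it as `patents.name_gender`) with the columns name, gender, and frequency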
//2.Run the query below (remove the surrounding /* */ comment markers first)
/*
-- Per first name: share of records tagged female, plus total record count.
WITH name_totals AS (
    -- One row per name, summing frequency across every input row for that name.
    SELECT
        name,
        SUM(CASE WHEN gender = 'F' THEN frequency ELSE 0 END) AS female_frequency,
        SUM(frequency) AS total_frequency
    FROM `patents.name_gender`
    GROUP BY name
)
SELECT
    name,
    -- Despite the column name, this is a ratio (female / total), not multiplied by 100.
    female_frequency / total_frequency AS percent_female,
    total_frequency
FROM name_totals
*/

//Save the query output as all_gender_name.csv
